# Imports
import numpy as np
import pandas as pd

# TODO 1: define data_preprocessing() to carry out the data preprocessing steps
def data_preprocessing(path):
    """Load a CSV file and discard its duplicated rows.

    The file is read with ``pd.read_csv`` using default options. Rows that
    repeat an earlier row in every column are then removed, keeping the
    first occurrence. Surviving rows keep their original index labels
    (the index is not reset).

    :param path: location of the CSV file, passed straight to ``pd.read_csv``
    :return: the de-duplicated ``DataFrame``
    """
    raw_frame = pd.read_csv(path)
    # Non-inplace form: yields the same rows and index as dropping in place.
    deduplicated = raw_frame.drop_duplicates()
    return deduplicated


if __name__ == "__main__":
    # Preprocess each dataset file in turn; the returned frames are not used here.
    for csv_path in ("../data/test2.csv", "../data/train.csv"):
        data_preprocessing(csv_path)